# Run the `bench` Python module once per -c value (256, 512, 1024), in that
# order, against the endpoint at http://127.0.0.1:8000/v1. Every other
# argument is identical across runs.
#
# NOTE(review): -c is presumably the client concurrency level and -t the
# total request count -- confirm against bench's own CLI help.
# NOTE(review): all runs pass the same --output value (test_out); whether
# later runs overwrite or add to earlier results depends on bench -- verify.
#
# A failing run does not stop the sweep; the remaining values still execute.
for concurrency in 256 512 1024; do
  python3 -m bench \
    --base-url http://127.0.0.1:8000/v1 \
    --model /model/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B \
    -c "$concurrency" \
    -t 5000 \
    --numrepeats 3 \
    --output test_out \
    --max_tokens 2048
done
